#!/bin/bash

# Run llama-cli once on a fixed prompt with libgemv.so injected via LD_PRELOAD.
#
# Environment overrides (each default equals the previously hard-coded value):
#   LLAMA_ROOT  llama.cpp checkout that contains build/bin/llama-cli
#   MODEL_PATH  GGUF model file handed to -m
#   GEMV_LIB    shared object to preload; the default is resolved relative to
#               the current working directory, not to this script's location
set -euo pipefail

LLAMA_ROOT=${LLAMA_ROOT:-/root/llama.cpp}
MODEL_PATH=${MODEL_PATH:-${LLAMA_ROOT}/models/deepseek-r1-distill-qwen-1.5b-q4_0.gguf}
GEMV_LIB=${GEMV_LIB:-./build/lib/libgemv.so}
readonly LLAMA_ROOT MODEL_PATH GEMV_LIB

# Print a message to stderr and abort with a non-zero status.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

llama_cli="${LLAMA_ROOT}/build/bin/llama-cli"

# The dynamic loader only prints a warning for an LD_PRELOAD entry it cannot
# open and then keeps going, so a wrong working directory would otherwise
# produce a run that silently lacks the library. Fail early instead.
[[ -f "${GEMV_LIB}" ]] \
  || die "preload library not found: ${GEMV_LIB} (run from the project root or set GEMV_LIB)"
[[ -x "${llama_cli}" ]] || die "llama-cli not found or not executable: ${llama_cli}"
[[ -f "${MODEL_PATH}" ]] || die "model file not found: ${MODEL_PATH}"

# Arguments live in an array so paths containing spaces survive intact.
# NOTE(review): flag meanings below are taken from llama.cpp's CLI help;
# confirm against the llama-cli version actually built.
llama_args=(
  -m "${MODEL_PATH}"
  # Prompt text must stay byte-identical: it uses the full-width bar markers.
  -p "<｜User｜>How many letter r in word 'strawberry'?<｜Assistant｜><think>"
  -s 20250527   # fixed seed
  -ctk q8_0     # K-cache type
  -no-cnv       # disable conversation mode
  -n 512        # token limit
)

# baseline
LD_PRELOAD="${GEMV_LIB}" "${llama_cli}" "${llama_args[@]}"